CU Amiga Super CD-ROM 24

home *** CD-ROM | disk | FTP | other *** search

/ CU Amiga Super CD-ROM 24 / CU Amiga Magazine's Super CD-ROM 24 (1998)(EMAP Images)(GB)(Track 1 of 2)[!][issue 1998-07].iso / CUCD / Programming / SWI / source / src / pl-index.c < prev next >

Wrap

C/C++ Source or Header | 1997-08-07 | 14.3 KB | 631 lines

/*  $Id: pl-index.c,v 1.21 1997/08/07 07:58:08 jan Exp $

    Copyright (c) 1990 Jan Wielemaker. All rights reserved.
    See ../LICENCE to find out about your rights.
    jan@swi.psy.uva.nl

    Purpose: indexing support
*/

#include "pl-incl.h"

/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Clause indexing.  Clauses store an  `index  structure',  which  provides
summary information on the unification behaviour of the clause (i.e. its
head  arguments).  This structure consists of two words: a key and a
varmask.  Indexing can be done with up to 4 arguments.   Both  words  are
divided  into  the  same  number  of  bit  groups  as  there are indexed
arguments.  If an argument  is  indexable  (atom,  integer  or  compound
term),  the  corresponding  bit group is filled with bits taken from the
atom  pointer,  integer  or  functor  pointer.    In   this   case   all
corresponding  bits  in  the varmask field are 1.  Otherwise the bits in
both the varmask and the key are all 0.

To find a clause using indexing, we calculate an  index  structure  from
the  calling  arguments  to  the goal using the same rules.  Now, we can
do a mutual `and' using the varmasks on the keys and compare the result.
If equal a good chance for a possible unification exists, otherwise
unification will definitely fail.  See matchIndex() and findClause().

Care has been taken to get this code as fast as possible,  notably  for
indexing only on the first argument as this is default.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

/* 1 <= c <= 4 */

/* SHIFT(c, a): bit offset of the group for indexed argument `a' when the
   word is divided over `c' indexed arguments.
   MASK(c):     bit mask (right-aligned) covering one such group.
   VM(c, a):    word with all bits set except those of group `a'; and-ing
		it into a varmask marks argument `a' as not indexable.
   Arguments are parenthesised so expressions can be passed safely.
*/

#define SHIFT(c, a)	((LONGBITSIZE/(c)) * (a))
#define MASK(c)		((c) == 1 ? ~0L : ((1L << (LONGBITSIZE/(c))) - 1))
#define VM(c, a)	((unsigned long)(~(MASK(c) << SHIFT(c, a))))

/* Table driven versions of the above, used at runtime */

#define Shift(c, a)	(mask_shift[c][a])
#define Mask(c)		(mask_mask[c])
#define varMask(c, a)	(variable_mask[c][a])

/* TRUE if the two index structures may belong to unifying terms: the keys
   are compared on the bit groups that are indexable in *both* structures.
*/

#define matchIndex(i1, i2)	(((i1).key & (i2).varmask) ==\
				 ((i2).key & (i1).varmask))

/* variable_mask[c][a] == VM(c, a).  Unless DONOT_AVOID_SHIFT_WARNING is
   defined, the c == 1 row is spelled out by hand to avoid the compiler
   warning on the (dead) full-width shift inside MASK(1).  VM(1, 0)
   evaluates to 0: with a single group, a non-indexable argument clears
   the entire varmask.  (The hand-written value used to be ~0L, which
   did not agree with the macro.)
*/

static unsigned long variable_mask[][4] =
  { { 0,        0,        0,        0 },
#ifdef DONOT_AVOID_SHIFT_WARNING
    { VM(1, 0), 0,        0,        0 },
#else
    { 0UL,      0,        0,        0 },
#endif
    { VM(2, 0), VM(2, 1), 0,        0 },
    { VM(3, 0), VM(3, 1), VM(3, 2), 0 },
    { VM(4, 0), VM(4, 1), VM(4, 2), VM(4, 3) }
  };

/* mask_shift[c][a] == SHIFT(c, a) */

static int mask_shift[][4] =
  { { 0,           0,           0,           0 },
    { SHIFT(1, 0), 0,           0,           0 },
    { SHIFT(2, 0), SHIFT(2, 1), 0,           0 },
    { SHIFT(3, 0), SHIFT(3, 1), SHIFT(3, 2), 0 },
    { SHIFT(4, 0), SHIFT(4, 1), SHIFT(4, 2), SHIFT(4, 3) }
  };

/* mask_mask[c] == MASK(c).  MASK(1) evaluates to all ones: a single
   group spans the whole word.  (The hand-written value used to be 0L,
   which reduced every key to 0 for predicates indexed on exactly one
   argument that is not the first, making all clauses match.)
*/

static unsigned long mask_mask[] =
  { 0,
#ifdef DONOT_AVOID_SHIFT_WARNING
    MASK(1),
#else
    ~0UL,
#endif
    MASK(2), MASK(3), MASK(4)
  };


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Return the number of 1-bits in pattern.  Given an index pattern this  is
the number of indexed arguments.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

int
cardinalityPattern(register unsigned long pattern)
{ register int result = 0;

  for(; pattern; pattern >>= 1)
    if ( pattern & 0x1 )
      result++;

  return result;
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Compute the index in the hash-array from a machine word and  the  number
of  buckets.   This used to be simple, but now that our tag bits are on
the left side, simply masking will put most things on the same hash-entry
as it is very common for all clauses of a predicate to have the same type
of object.  Hence, we now use exclusive or of the real value part and the
tag-bits.

The result is masked with buckets-1, so buckets must be a  power  of  two
(newClauseIndexTable() rounds the requested size up accordingly).
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

static inline int
hashIndex(word key, int buckets)
{ unsigned long k = key >> LMASK_BITS;

  return (key^k) & (buckets-1);
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Return the word used as indexing key for the term w, or 0L if w  is  not
indexable.   References  are  followed  until  a non-reference is found.
Variables, strings, floats and integers that are not  stored  inline  are
not  indexable.  Atoms and inline integers are their own key.  Compound
terms yield the first word of the term (*valPtr(w)).
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

static word
indexOfWord(word w)
{ for(;;)
  { switch(tag(w))
    { case TAG_VAR:
      case TAG_STRING:
      case TAG_FLOAT:
	return 0L;
      case TAG_INTEGER:
	if ( storage(w) != STG_INLINE )
	  return 0L;
	/*FALLTHROUGH*/			/* inline integer: key is w */
      case TAG_ATOM:
	return w;
      case TAG_COMPOUND:
	return *valPtr(w);
      case TAG_REFERENCE:
	w = *unRef(w);			/* dereference and try again */
	continue;
    }
  }
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Compute the index structure for an argument vector.

	argv	First argument of the term
	pattern	Bitmask: bit N is set if argument N (0-based) is indexed
	card	Number of bits set in pattern
	index	Receives the resulting key and varmask

Indexing on just the first argument (pattern == 0x1) stores the plain key
of indexOfWord().  Otherwise each indexed argument contributes one bit
group.  pattern must hold at least card 1-bits: the inner loop skips
non-indexed arguments until it finds the next 1-bit.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

void
getIndex(register Word argv, register unsigned long pattern, int card,
	 struct index *index)
{ if ( pattern == 0x1L )
  { index->key     = indexOfWord(*argv);
    index->varmask = (index->key ? (unsigned long) ~0L : 0L);

    return;
  } else
  { word key;
    int a;

    index->key = 0;
    index->varmask = (unsigned long) ~0L;		/* all 1s */

    for(a = 0; a < card; a++, pattern >>= 1, argv++)
    { for(;(pattern & 0x1) == 0; pattern >>= 1)	/* skip non-indexed args */
	argv++;

      key = indexOfWord(*argv);
      if ( !key )				/* not indexable: clear group */
      { index->varmask &= varMask(card, a);
      }
      key = key ^ (key >> LMASK_BITS);		/* see hashIndex() */
      index->key |= ((key & Mask(card)) << Shift(card, a) );
    }
  }

  return;
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Find the first clause, starting at cref, that is not erased  and  whose
index  matches  the arguments in argv.  Returns NULL if there is no such
clause.  On success, *deterministic tells the caller whether this is the
only candidate:

    - Without indexing (or when the first argument is not indexable) it
      is TRUE iff the returned reference is the last one of the chain.
    - With indexing it is TRUE iff no later non-erased clause matches.

If the definition is flagged NEED_REINDEX, it is reindexed first.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

ClauseRef
findClause(ClauseRef cref, Word argv, Definition def, bool *deterministic)
{ if ( def->indexPattern == 0x0L )
  {
  noindex:
    for(;;cref = cref->next)
    { if ( cref )
      { if ( false(cref->clause, ERASED) )
	{ *deterministic = !cref->next;
	  return cref;
	}
      } else
	return NULL;
    }
  } else if ( def->indexPattern == 0x1L )	/* first argument only */
  { word key = indexOfWord(*argv);

    if ( !key )
      goto noindex;

    for(;cref ; cref = cref->next)
    { Clause clause = cref->clause;

      if ( (key & clause->index.varmask) == clause->index.key &&
	   false(clause, ERASED))
      { ClauseRef result = cref;

	/* look ahead for a second candidate to determine determinism */
	for( cref = cref->next; cref; cref = cref->next )
	{ clause = cref->clause;
	  if ( (key&clause->index.varmask) == clause->index.key &&
	       false(clause, ERASED))
	  { *deterministic = FALSE;

	    return result;
	  }
	}
	*deterministic = TRUE;

	return result;
      }
    }
    return NULL;
  } else if ( def->indexPattern & NEED_REINDEX )
  { reindexDefinition(def);
    return findClause(cref, argv, def, deterministic);
  } else					/* general (multi-arg) case */
  { struct index argIndex;

    getIndex(argv, def->indexPattern, def->indexCardinality, &argIndex);
    for(; cref; cref = cref->next)
    { if ( matchIndex(argIndex, cref->clause->index) &&
	   false(cref->clause, ERASED))
      { ClauseRef result = cref;

	for( cref = cref->next; cref; cref = cref->next )
	{ if ( matchIndex(argIndex, cref->clause->index) &&
	       false(cref->clause, ERASED))
	  { *deterministic = FALSE;

	    return result;
	  }
	}
	*deterministic = TRUE;

	return result;
      }
    }
    return NULL;
  }
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Find the first non-erased clause, starting at cref, that matches the
precomputed index structure ctx.  The shape of ctx->varmask selects  the
search: all ones uses the fast full-key comparison, zero means nothing is
indexable and any non-erased clause will do, anything  else  requires  a
full matchIndex().  *det is set as described with findClause().  Returns
NULL if no clause matches.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

static ClauseRef
nextClause(ClauseRef cref, bool *det, Index ctx)
{ if ( ctx->varmask == ~0x0L )		/* first argument only */
  { word key = ctx->key;

    for(;cref ; cref = cref->next)
    { Clause clause = cref->clause;

      if ( (key & clause->index.varmask) == clause->index.key &&
	   false(clause, ERASED))
      { ClauseRef result = cref;

	for( cref = cref->next; cref; cref = cref->next )
	{ clause = cref->clause;
	  if ( (key&clause->index.varmask) == clause->index.key &&
	       false(clause, ERASED))
	  { *det = FALSE;

	    return result;
	  }
	}
	*det = TRUE;

	return result;
      }
    }
  } else if ( ctx->varmask == 0x0L )	/* no indexing */
  { for(; cref; cref = cref->next)
    { if ( false(cref->clause, ERASED) )
      { *det = !cref->next;
	return cref;
      }
    }
  } else				/* general (multi-arg) indexing */
  { for(; cref; cref = cref->next)
    { if ( matchIndex(*ctx, cref->clause->index) &&
	   false(cref->clause, ERASED))
      { ClauseRef result = cref;

	for( cref = cref->next; cref; cref = cref->next )
	{ if ( matchIndex(*ctx, cref->clause->index) &&
	       false(cref->clause, ERASED))
	  { *det = FALSE;

	    return result;
	  }
	}
	*det = TRUE;

	return result;
      }
    }
  }

  return NULL;
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Find the first clause of def that may unify with the arguments in  argv.
With first-argument indexing and a hash-table on the definition, only the
chain of the bucket for the key is searched;  otherwise  the  search
starts  at  the  head  of  the  clause  list.   Definitions  flagged
NEED_REINDEX are reindexed before searching.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

static ClauseRef
firstClause(Word argv, Definition def, bool *det)
{ ClauseRef cref;
  struct index buf;
  Index ctx = &buf;

again:
  if ( def->indexPattern == 0x0L )
  {
  noindex:
    for(cref = def->definition.clauses; cref; cref = cref->next)
    { if ( false(cref->clause, ERASED) )
      { *det = !cref->next;
	return cref;
      }
    }
    return NULL;
  } else if ( def->indexPattern == 0x1L )
  { word key = indexOfWord(*argv);

    if ( key == 0L )
      goto noindex;

    ctx->key     = key;
    ctx->varmask = (unsigned long) ~0x0L;
    if ( def->hash_info )
    { int hi = hashIndex(key, def->hash_info->buckets);

      cref = def->hash_info->entries[hi].head;
    } else
      cref = def->definition.clauses;
  } else if ( def->indexPattern & NEED_REINDEX )
  { reindexDefinition(def);
    goto again;
  } else
  { getIndex(argv, def->indexPattern, def->indexCardinality, ctx);
    cref = def->definition.clauses;
  }

  return nextClause(cref, det, ctx);
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Recalculate the index of a clause after the  index  pattern  on  the
predicate  has  been  changed.   The head of the clause is decompiled.
The resulting term is simply discarded as it cannot have links  to  any
other part of the stacks (e.g. backtrailing is not needed).

Erased clauses and predicates without indexing are left untouched.  This
function always succeeds.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

bool
reindexClause(Clause clause)
{ Procedure proc = clause->procedure;
  unsigned long pattern = proc->definition->indexPattern;

  if ( pattern == 0x0 )
    succeed;

  if ( false(clause, ERASED) )
  { fid_t fid = PL_open_foreign_frame();

    if ( pattern == 0x1 )		/* the 99.9% case.  Speedup a little */
    { word key;

      if ( arg1Key(clause, &key) )
      { clause->index.key     = key;
	clause->index.varmask = (unsigned long)~0L;
      } else
      { clause->index.key     = 0L;
	clause->index.varmask = 0L;
      }
    } else
    { term_t head = PL_new_term_ref();

      decompileHead(clause, head);
      getIndex(argTermP(*valTermRef(head), 0),
	       pattern,
	       proc->definition->indexCardinality,
	       &clause->index);
    }

    PL_discard_foreign_frame(fid);
  }

  succeed;
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Unify value with a term that has the functor of the  predicate  and  in
which  each argument is the integer 1 if the predicate is indexed on that
argument and 0 otherwise.  Fails if the predicate  is  not  indexed  (the
NEED_REINDEX flag is ignored) or if unification fails.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

bool
unify_index_pattern(Procedure proc, term_t value)
{ Definition def = proc->definition;
  unsigned long pattern = (def->indexPattern & ~NEED_REINDEX);
  int n, arity = def->functor->arity;

  if ( pattern == 0 )
    fail;

  if ( PL_unify_functor(value, def->functor->functor) )
  { term_t a = PL_new_term_ref();

    for(n=0; n<arity; n++, pattern >>= 1)
    { if ( !PL_get_arg(n+1, value, a) ||
	   !PL_unify_integer(a, (pattern & 0x1) ? 1 : 0) )
	fail;
    }

    succeed;
  }

  fail;
}

		 /*******************************
		 *	   HASH SUPPORT		*
		 *******************************/

/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Allocate an empty clause index table.  The number of buckets is  rounded
up  to a power of two that is at least 4, as required by hashIndex().
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

static ClauseIndex
newClauseIndexTable(int buckets)
{ ClauseIndex ci = allocHeap(sizeof(struct clause_index));
  ClauseChain ch;
  int m = 4;

  while(m<buckets)
    m *= 2;
  buckets = m;

  ci->buckets  = buckets;
  ci->size     = 0;
  ci->alldirty = FALSE;
  ci->entries  = allocHeap(sizeof(struct clause_chain) * buckets);

  for(ch = ci->entries; buckets; buckets--, ch++)
  { ch->head = ch->tail = NULL;
    ch->dirty = 0;
  }

  return ci;
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Release a clause index table: all clause references in  all  chains,  the
array of chains and the table itself.  The clauses are not touched.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

void
unallocClauseIndexTable(ClauseIndex ci)
{ ClauseChain ch;
  int buckets = ci->buckets;

  for(ch = ci->entries; buckets; buckets--, ch++)
  { ClauseRef cr, next;

    for(cr = ch->head; cr; cr = next)
    { next = cr->next;			/* fetch before releasing cr */
      freeHeap(cr, sizeof(*cr));
    }
  }

  freeHeap(ci->entries, ci->buckets * sizeof(struct clause_chain));
  freeHeap(ci, sizeof(struct clause_index));
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Add a new reference to clause cl to the chain ch.  If where is CL_START
the reference is added at the head of the chain, otherwise at the tail.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

static void
appendClauseChain(ClauseChain ch, Clause cl, int where)
{ ClauseRef cr = newClauseRef(cl);

  if ( !ch->tail )			/* empty chain */
    ch->head = ch->tail = cr;
  else
  { if ( where != CL_START )
    { ch->tail->next = cr;
      ch->tail = cr;
    } else
    { cr->next = ch->head;
      ch->head = cr;
    }
  }
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Unlink the reference to clause from the chain ch, if  present.   A clause
is added at most once to a chain (see addClauseToIndex()), so we are done
after the first hit.  Returning there  also  avoids  continuing the walk
with prev pointing at the node that was just unlinked.

NOTE(review): the unlinked ClauseRef is not released here,  whereas
gcClauseChain() calls freeClauseRef() on the references it unlinks.  This
looks like a leak, but ownership cannot be verified from this file alone;
confirm against the callers before adding a free.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

static void
deleteClauseChain(ClauseChain ch, Clause clause)
{ ClauseRef prev = NULL;
  ClauseRef c;

  for(c = ch->head; c; prev = c, c = c->next)
  { if ( c->clause == clause )
    { if ( !prev )
      { ch->head = c->next;
	if ( !c->next )
	  ch->tail = NULL;
      } else
      { prev->next = c->next;
	if ( !c->next)
	  ch->tail = prev;
      }

      return;
    }
  }
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Remove and release the references to erased  clauses  from  chain  ch.
dirty  is  the maximum number of references to remove; the scan stops as
soon as that many have been found.  Returns the number of removed clauses
that have a non-zero varmask.  Such clauses appear in one chain only and
thus count for the size of the table.  Clauses with a zero  varmask  are
in every chain (see addClauseToIndex()) and are not counted.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

static int
gcClauseChain(ClauseChain ch, int dirty)
{ ClauseRef cref = ch->head, prev = NULL;
  int deleted = 0;

  while( cref && dirty )
  { if ( true(cref->clause, ERASED) )
    { ClauseRef c = cref;

      if ( c->clause->index.varmask != 0 ) /* indexed and only in this */
	deleted++;			   /* chain */
      dirty--;

      cref = cref->next;		/* advance before releasing c */
      if ( !prev )
      { ch->head = c->next;
	if ( !c->next )
	  ch->tail = NULL;
      } else
      { prev->next = c->next;
	if ( c->next == NULL)
	  ch->tail = prev;
      }

      freeClauseRef(c);
    } else
    { prev = cref;
      cref = cref->next;
    }
  }

  ch->dirty = 0;

  return deleted;
}


/* Largest int: `no limit' for gcClauseChain().  Computed in unsigned
   arithmetic; shifting 1 into the sign bit of a signed int is undefined.
*/

#define INFINT ((int)(~0U >> 1))

/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Remove the references to erased clauses from the table and  update  its
size.   If the table is flagged alldirty every chain is scanned entirely.
Otherwise only the chains with a non-zero dirty count are scanned.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

void
gcClauseIndex(ClauseIndex ci)
{ ClauseChain ch = ci->entries;
  int n = ci->buckets;

  if ( ci->alldirty )
  { for(; n; n--, ch++)
      ci->size -= gcClauseChain(ch, INFINT);
  } else
  { for(; n; n--, ch++)
    { if ( ch->dirty )
	ci->size -= gcClauseChain(ch, ch->dirty);
    }
  }
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Register that clause cl needs to be removed from the table  by  a  later
gcClauseIndex().   A clause with a zero varmask is in all chains, so the
entire table is flagged.  Otherwise the dirty count of the chain holding
the clause is incremented.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

void
markDirtyClauseIndex(ClauseIndex ci, Clause cl)
{ if ( cl->index.varmask == 0 )
    ci->alldirty = TRUE;
  else
  { int hi = hashIndex(cl->index.key, ci->buckets);
    ci->entries[hi].dirty++;
  }
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Add clause cl to the hash-table of def (def->hash_info must be set).   A
clause whose index is not usable (zero varmask) may match any key and is
therefore added to every chain.  Other clauses are added to the chain of
their key.  If the number of such clauses exceeds  twice  the  number  of
buckets, the definition is flagged NEEDSREHASH.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

void
addClauseToIndex(Definition def, Clause cl, int where)
{ ClauseIndex ci = def->hash_info;
  ClauseChain ch = ci->entries;

  if ( cl->index.varmask == 0 )		/* a non-indexable field */
  { int n = ci->buckets;

    for(; n; n--, ch++)
      appendClauseChain(ch, cl, where);
  } else
  { int hi = hashIndex(cl->index.key, ci->buckets);

    DEBUG(2, Sdprintf("Storing in bucket %d\n", hi));
    appendClauseChain(&ch[hi], cl, where);

    if ( ++ci->size / 2 > ci->buckets )
    { enterDefinition(def);
      set(def, NEEDSREHASH);
      leaveDefinition(def);
    }
  }
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Remove clause cl from the table: from every chain if its varmask is zero
and from the chain of its key (decrementing the table size) otherwise.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

void
delClauseFromIndex(ClauseIndex ci, Clause cl)
{ ClauseChain ch = ci->entries;

  if ( cl->index.varmask == 0 )		/* a non-indexable field */
  { int n = ci->buckets;

    for(; n; n--, ch++)
      deleteClauseChain(ch, cl);
  } else
  { int hi = hashIndex(cl->index.key, ci->buckets);

    deleteClauseChain(&ch[hi], cl);
    ci->size--;
  }
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Create a hash-table of (at least) buckets entries for def and add all its
clauses to it.  Fails for foreign predicates and for predicates that are
not indexed on exactly their first argument.

NOTE(review): def->hash_info is overwritten without looking at a previous
value.  Presumably callers release an existing table first; verify.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

bool
hashDefinition(Definition def, int buckets)
{ ClauseRef cref;

  if ( true(def, FOREIGN) )
    fail;
  if ( def->indexPattern != 0x1 )
    fail;

  def->hash_info = newClauseIndexTable(buckets);

  for(cref = def->definition.clauses; cref; cref = cref->next)
    addClauseToIndex(def, cref->clause, CL_END);

  succeed;
}


/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Create a hash-table of 256 buckets for the predicate pred.  The procedure
is looked up using GP_CREATE.  A pending reindex of a  non-foreign
predicate  is  performed  first.   Fails if the procedure cannot be found
or hashDefinition() fails.
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */

word
pl_hash(term_t pred)
{ Procedure proc;

  if ( get_procedure(pred, &proc, 0, GP_CREATE) )
  { Definition def = proc->definition;

    if ( false(def, FOREIGN) && def->indexPattern & NEED_REINDEX )
      reindexDefinition(def);

    return hashDefinition(def, 256);
  }

  fail;
}